package com.zzvcom.office.docx4jutil;

import cn.hutool.core.util.StrUtil;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.select.Elements;

public class HtmlToXhtml implements java.io.Serializable {
    /**
     * 转过的xhtml
     */
    private String xHtml;


    /**
     * html转成xhtml
     * @param html
     */
    private void toXHTML(String html) {
        final Document document = Jsoup.parse(html);
        document.outputSettings().syntax(Document.OutputSettings.Syntax.xml);
        //https://github.com/plutext/docx4j/issues/79



        xHtml= document.html().replace("&nbsp;", "\u00A0");
    }
}
